import jieba
import json
from tqdm import tqdm


def main():
    """Read the baike_qa training file and assemble the text of each record.

    Every non-blank line of the source file is parsed as one JSON object, and
    its ``title``, ``desc`` and ``answer`` values are concatenated with single
    spaces between them. Lines that are empty after stripping whitespace are
    skipped instead of being passed to the JSON parser.

    The source path is relative, so it is resolved against the current
    working directory of the process.

    Raises:
        OSError: If the source file cannot be opened.
        json.JSONDecodeError: If a non-blank line is not valid JSON.
        KeyError: If a record lacks ``title``, ``desc`` or ``answer``.
    """
    SOURCE_INDEX_DATA_PATH = "../corpus/baike_qa/baike_qa_train.json"
    # NOTE(review): not referenced anywhere else in this function yet;
    # presumably the name of the dictionary to be produced -- confirm.
    DIC_DATA = 'baike_qa_dic_2w'

    with open(SOURCE_INDEX_DATA_PATH, encoding="utf8") as f:
        for line in f:
            record = line.strip()
            if not record:
                # json.loads('') raises JSONDecodeError, so a blank or
                # trailing empty line must not abort the whole pass.
                continue
            text = json.loads(record)
            # NOTE(review): `content` is built but not consumed yet; the
            # lookups still enforce that all three keys are present.
            content = text['title'] + ' ' + text['desc'] + ' ' + text['answer']



# Run the corpus pass only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == '__main__':
    main()
